#pragma once

#include <memory>
#include <string>

#include <http_client.h>

// Shorthand for the Triton client namespace; used below to name
// tc::InferenceServerHttpClient. Because this is a header, the alias is
// visible to every translation unit that includes it.
namespace tc = triton::client;

/// Holds the settings (model name, model version, server URL) and the Triton
/// HTTP client handle for talking to a language model.
///
/// The std::unique_ptr member makes this type movable but not copyable.
class LLM {
public:
    /// Default constructor; defined out of line.
    /// NOTE(review): presumably creates httpClient_ for httpServerUrl_ — confirm
    /// against the implementation file.
    LLM();

    /// Takes a prompt and returns a string; defined out of line.
    /// NOTE(review): presumably submits the prompt to the configured model and
    /// returns its reply — confirm against the implementation file.
    ///
    /// @param prompt Input text, passed by const reference.
    /// @return A std::string produced by the implementation.
    std::string chat(const std::string &prompt);

private:
    /// Model name; defaults to "llamacpp".
    std::string modelName_{"llamacpp"};
    /// Model version; defaults to the empty string.
    std::string modelVersion_{};

    /// Server URL; defaults to a local endpoint on port 8000.
    std::string httpServerUrl_{"http://localhost:8000"};
    /// Owning handle to the Triton HTTP client; null until assigned.
    std::unique_ptr<tc::InferenceServerHttpClient> httpClient_;
};